Overview

Dataset Statistics

Number of Features 21
Number of Rows 14461760

Features Statistics

feature name | feature type | unique values / total rows | description (summary statistics)
text_tokens text 8655717/14461760 {'unique': 8655717, 'top': '101\t100\t102', 'freq': 58093}
hashtags {'is_string': True} 799316/14461760 {'unique': 799316, 'top': 'A338C5C1637BEDA847BC1237241145BC', 'freq': 66849}
tweet_id {'is_string': True} 10281499/14461760 {'unique': 10281499, 'top': 'E77466CC1BD39E3F1B1FDEC5EB2D1C4D', 'freq': 1192}
present_media {'is_string': True} 18/14461760 {'unique': 18, 'top': 'Photo', 'freq': 2974612}
present_links {'is_string': True} 911887/14461760 {'unique': 911887, 'top': 'C7706D041E70CEBDCE3BDF69590BF99C', 'freq': 2491}
present_domains {'is_string': True} 119892/14461760 {'unique': 119892, 'top': 'F595B7DE8992A3D8C7948B4E81419D78', 'freq': 142378}
tweet_type {'is_string': True} 3/14461760 {'unique': 3, 'top': 'TopLevel', 'freq': 8776383}
language {'is_string': True} 66/14461760 {'unique': 66, 'top': '488B32D24BD4BB44172EB981C1BCA6FA', 'freq': 5465361}
tweet_timestamp {'is_string': True} 604800/14461760 {'unique': 604800, 'top': '2021-02-27 15:00:01', 'freq': 1502}
engaged_with_user_id {'is_string': True} 3575965/14461760 {'unique': 3575965, 'top': 'E9DD2A9AA5584BA1676200FC307AD812', 'freq': 14771}
engaged_with_user_follower_count {'is_integer': True, 'is_numeric': True} 135742/14461760 {'mean': 956462.918704639, 'std': 5044897.885428854, 'min': 1.0, '25%': 1581.0, '50%': 14328.0, '75%': 189523.0, 'max': 129448458.0}
engaged_with_user_following_count {'is_integer': True, 'is_numeric': True} 35636/14461760 {'mean': 4402.458133657314, 'std': 35641.3635287107, 'min': 0.0, '25%': 219.0, '50%': 645.0, '75%': 1788.0, 'max': 4253259.0}
engaged_with_user_is_verified {'is_integer': True, 'is_numeric': True} 2/14461760 {'mean': 0.23367280331024717, 'std': 0.42316644087838146, 'min': 0.0, '25%': 0.0, '50%': 0.0, '75%': 0.0, 'max': 1.0}
engaged_with_user_account_creation {'is_string': True} 3553680/14461760 {'unique': 3553680, 'top': '2020-11-25 15:27:39', 'freq': 14771}
engaging_user_id {'is_string': True} 6161080/14461760 {'unique': 6161080, 'top': 'A7A011A51139BEBF2F415053BD1A7E77', 'freq': 181}
engaging_user_follower_count {'is_integer': True, 'is_numeric': True} 39504/14461760 {'mean': 1025.1536239019317, 'std': 19024.37964662244, 'min': 0.0, '25%': 57.0, '50%': 204.0, '75%': 627.0, 'max': 18290923.0}
enaging_user_following_count {'is_integer': True, 'is_numeric': True} 19969/14461760 {'mean': 859.5990557165933, 'std': 2224.6403751529906, 'min': 1.0, '25%': 172.0, '50%': 391.0, '75%': 888.0, 'max': 1604778.0}
enaging_user_is_verified {'is_integer': True, 'is_numeric': True} 2/14461760 {'mean': 0.0019555711061447567, 'std': 0.0441785805877998, 'min': 0.0, '25%': 0.0, '50%': 0.0, '75%': 0.0, 'max': 1.0}
engaging_user_account_creation {'is_string': True} 6085624/14461760 {'unique': 6085624, 'top': '2019-10-29 16:18:27', 'freq': 181}
engagee_follows_engager {'is_integer': True, 'is_numeric': True} 2/14461760 {'mean': 0.34926419744208176, 'std': 0.47673759401064836, 'min': 0.0, '25%': 0.0, '50%': 0.0, '75%': 1.0, 'max': 1.0}
reply {'is_integer': True, 'is_numeric': True} 2/14461760 {'mean': 0.021059746531542495, 'std': 0.1435835472229967, 'min': 0.0, '25%': 0.0, '50%': 0.0, '75%': 0.0, 'max': 1.0}

Interactions